for (i=0; i<n; i++)

y[i] = x[i] + 1; 



II 

// IA-64 software-pipelined loop computing y[i] = x[i] + 1 one byte at a time.
// The kernel has three stages (load, add, store), each guarded by its own
// rotating predicate (p16, p17, p18). br.ctop rotates the registers on every
// trip, so a value written to r32 by the load is read as r33 by the add on the
// next trip, and the add's r34 result is read as r35 by the store one trip later.
//
// Registers as used by this listing:
//   r12 - load address, post-incremented by 1 after each load
//         (presumably &x[0] on entry; set up outside this listing - confirm)
//   r13 - store address, post-incremented by 1 after each store
//         (presumably &y[0] on entry; set up outside this listing - confirm)
//
// NOTE(review): the listing shows no instruction-group stops (;;). It reads as
// a teaching example; a real assembler will likely need stops between the
// setup instructions - confirm before assembling.

        mov     pr.rot = 0              // Clear all rotating predicate registers
        cmp.eq  p16,p0 = r0,r0          // Set p16=1 (r0 == r0 is always true), enabling stage 1
        mov     ar.lc = 4               // Set loop counter to n-1 (n = 5 in this example)
        mov     ar.ec = 3               // Set epilog counter to 3, one per pipeline stage

// loop
loop:
(p16)   ld1     r32 = [r12],1           // Stage 1: load x
(p17)   add     r34 = 1,r33             // Stage 2: y=x+1
(p18)   st1     [r13] = r35,1           // Stage 3: store y
        br.ctop.sptk.few loop           // Branch back



// loop
loop:

(p16) ld1 r32 = [r12],1
(p17) add r34 = 1,r33
(p18) st1 [r13] = r35,1

// loop

(p63) ld1 r127 = [r12],1

(p16) add r33 = 1,r32

(p17) st1 [r13] = r34,1

// loop

(p62) ld1 r126 = [r12],1

(p63) add r32 = 1,r127

(p16) st1 [r13] = r33,1

// loop

(p61) ld1 r125 = [r12],1

(p62) add r31 = 1,r126

(p63) st1 [r13] = r32,1



// Stage 1: load x 
// Stage 2: y=x+1 
// Stage 3: store y 

// Stage 1: load x 
// Stage 2: y=x+1 
// Stage 3: store y 

// Stage 1: load x 
// Stage 2: y=x+1 
// Stage 3: store y 

// Stage 1: load x 
// Stage 2: y=x+1
// Stage 3: store y 
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